rem Pipeline: OCR a PDF, extract its text, post-process the text with
rem rightTxt.exe, then hand the results to sub_pdf_to_web_server.py.
rem Each step consumes the file written by the previous one, so the script
rem stops with exit code 1 as soon as a step fails or its output is missing,
rem instead of running the later steps (including the final submission)
rem against files that do not exist.

rem Remove outputs of earlier runs. Because of this, an output file that
rem exists further down can only have been produced by the current run.
del data\output_*.*

rem Step 1: OCR data\input_3.pdf into data\output_2.pdf.
rem   -l chi_sim                 Tesseract language pack: Simplified Chinese
rem   --tesseract-oem 1          Tesseract OCR engine mode 1
rem   --force-ocr                OCR every page even if it already has text
rem   --tesseract-pagesegmode 6  Tesseract page segmentation mode 6
ocrmypdf -l chi_sim --tesseract-oem 1 --force-ocr --tesseract-pagesegmode 6 data\input_3.pdf data\output_2.pdf
if errorlevel 1 (echo ERROR: ocrmypdf failed. 1>&2 & exit /b 1)
if not exist data\output_2.pdf (echo ERROR: data\output_2.pdf was not created. 1>&2 & exit /b 1)

rem Step 2: run extract_txt_from_pdf.py on the OCRed PDF; the second
rem argument is presumably the text file it writes - confirm in the script.
python extract_txt_from_pdf.py data\output_2.pdf data\output_3.txt
if errorlevel 1 (echo ERROR: extract_txt_from_pdf.py failed. 1>&2 & exit /b 1)
if not exist data\output_3.txt (echo ERROR: data\output_3.txt was not created. 1>&2 & exit /b 1)

rem Step 3: run rightTxt.exe (command "right-txt", language "chinese") on
rem the extracted text, writing to data\output_4.txt.
rem Only the output file is checked here: the exit-code convention of
rem rightTxt.exe is not known from this script - TODO confirm and add an
rem errorlevel check if it returns non-zero on failure.
rightTxt.exe --command="right-txt" --path="data\output_3.txt" --language="chinese" --outPath="data\output_4.txt"
if not exist data\output_4.txt (echo ERROR: data\output_4.txt was not created. 1>&2 & exit /b 1)

rem Step 4: pass the PDF and the text files to sub_pdf_to_web_server.py.
rem NOTE(review): this step uses data\input_1.pdf, while the OCR step above
rem reads data\input_3.pdf - confirm that the two different inputs are intended.
rem NOTE(review): data\output_4.txtdesp.txt is not written by any command
rem visible here; presumably rightTxt.exe or the script itself creates it -
rem verify before adding an existence check for it.
python sub_pdf_to_web_server.py data\input_1.pdf data\output_4.txt data\output_4.txtdesp.txt
if errorlevel 1 (echo ERROR: sub_pdf_to_web_server.py failed. 1>&2 & exit /b 1)